#!/usr/bin/python
# -*- coding:utf-8 -*-
from simple_html_dom import  *

# Empty mapping; nothing in this section of the script fills it in.
pCategories = {}

# Page to scrape (an archive index on 51voa.com, per the URL itself).
ARCHIVE_URL = "http://www.51voa.com/VOA_Standard_1_archiver.html"

# Download and parse the page; file_get_html presumably comes from the
# simple_html_dom star import at the top of the file.
tmp_p = file_get_html(ARCHIVE_URL)

# Collect the anchors matched by the selector "#list li a".
tmpList = tmp_p.find("#list li a")

# Print each anchor's href attribute alongside its text content.
for p in tmpList:
    href = p.href
    title = p.text()
    print(href, title)
#========================
